<?php
	/*
	 * Keyword extraction script: loads one HTML file, passes its text through
	 * a chain of helper functions and dumps the final result with print_r().
	 *
	 * NOTE(review): none of the helpers called below are defined in this file;
	 * presumably they all come from tokenizer.php -- confirm.
	 */
	require 'tokenizer.php';

	// Relative path of the input document handed to file2string().
	$file = 'Article_page.html';

	// Load the document, then run the encoding conversion on what was read.
	$text = file2string($file);
	$text = convert2utf($text);

	// URLs are pulled from the text while it still contains its markup.
	// $urls is not read again in this script; the call is kept in place in
	// case the helper has side effects.
	$urls = extract_html_urls($text);

	// Apply the three strip_* helpers one after another, each receiving the
	// output of the previous one.
	foreach (array('strip_html_tags', 'strip_punctuation', 'strip_numbers') as $cleanup) {
		$text = $cleanup($text);
	}

	// Stem the cleaned text, count the resulting words, and reduce the
	// counts to the keyword list.
	$keywords = getKeywords(countWords(stemText($text)));

	print_r($keywords);

?>